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INTRODUCTION 

The  C++  developers  are  well  aware  of  how  useful  std::strings  +=  and  +  operators  are  but  not 
always  aware  of  which  one  is  more  efficient  and  in  turn  better  to  use.  The  +  operator  may  provide 
the  coder  the  ability  to  put  more  code  on  a  single  line,  but  it  turns  out  that  the  assembly  code 
produced  is  far  less  efficient. 


METHODOLOGY 

In  order  to  acquire  data  for  this  report,  a  program  was  written  that  would  concatenate  strings 
using  the  +=  operator  and  also  concatenate  the  same  two  strings  using  the  +  operator.  Data  was 
collected  for  concatenating  2  to  10  strings.  The  source  code  for  this  program  is  shown  in  the 
following  sequence: 

int_tmain(int  argc,  _TCHAR*  argv[]) 

{ 

LARGEJNTEGER  frequency; 

QueryPerformanceFrequency(&frequency); 

LARGEJNTEGER  starting_time,  endingjime,  elapsed_microseconds; 

//std::ofstream  a_file("outfile2.txt"); 

//std::ofstream  a_file("outfile3.txt"); 

//std::ofstream  a_file("outfile4.txt"); 

//std::ofstream  a_file("outfile5.txt"); 

//std::ofstream  a_file("outfile6.txt"); 

//std::ofstream  a_file("outfile7.txt"); 

//std::ofstream  a_file("outfile8.txt"); 

//std::ofstream  a_file("outfile9.txt"); 
std::ofstream  a_file("outfilel0.txt"); 


//setup  strings  here 
std :  :vector<std :  :string>  my_stri ngs; 
my_strings.push_back("This  is  the  first.'1); 
my_strings.push_back("This  is  the  second."); 
my_strings.push_back("This  is  the  third."); 
my_strings.push_back("This  is  the  fourth."); 
my_strings.push_back("This  is  the  fifth.’1); 
my_strings.push_back("This  is  the  sixth.'1); 
my_strings.push_back("This  is  the  seventh."); 
my_strings.push_back("This  is  the  eighth."); 
my_strings.push_back("This  is  the  nineth."); 
my_strings.push_back("This  is  the  tenth."); 

std -string  plus_equal; 
std -string  plus_plus; 

for(auto  i  =  Ou;  i  <  10;  ++i) 

{ 

plus_equal  = ""; 

QueryPerformanceCounter(&starting_time); 

//code  to  measure  here 
plus_equal  =  my_strings[0]; 
plus_equal  +=  my_strings[l); 
plus_equal  +=  my_strings[2); 
plus_equal  +=  my_strings[3]; 
plus_equal  +=  my_strings[4]; 
plus_equal  +=  my_strings[5]; 
plus_equal  +=  my_strings[6]; 
plus_equal  +=  my_strings[7); 
plus_equal  +=  my_strings[8]; 
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plus_equal  +=  my_strings[9]; 

QueryPerformanceCounter(&ending_time); 

elapsed_microseconds.QuadPart  =  ending_time.QuadPart  -  starting_time.QuadPart; 

//this  time  is  in  micro  seconds 

auto  te_plus_equal  =  static_cast<double>((elapsed_microseconds.QuadPart  *  1000000.0)  /  frequency.QuadPart); 


plus_plus  = 

QueryPerformanceCounter(&starting_time); 

//code  to  measure  here 

//plus_plus  =  my_strings[0]  +  my_strings[l]; 

//plus_plus  =  my_strings[0]  +  my_strings[l]  +  my_strings[2]; 

//plus_plus  =  my_strings[0]  +  my_strings[l]  +  my_strings[2]  +  my_strings[3]; 

//plus_plus  =  my_strings[0]  +  my_strings[l]  +  my_strings[2]  +  my_strings[3]  +  my_strings[4]; 

//plus_plus  =  my_strings[0]  +  my_strings[l]  +  my_strings[2]  +  my_strings[3]  +  my_strings[4]  +  my_strings[5]; 

//plus_plus  =  my_strings[0]  +  my_strings[l]  +  my_strings[2]  +  my_strings[3]  +  my_strings[4]  +  my_strings[5]  +  my_strings[6]; 

//plus_plus  =  my_strings[0]  +  my_strings[l]  +  my_strings[2]  +  my_strings[3]  +  my_strings[4]  +  my_strings[5]  +  my_strings[6]  + 

my_strings[7]; 

//plus_plus  =  my_strings[0]  +  my_strings[l]  +  my_strings[2]  +  my_strings[3]  +  my_strings[4]  +  my_strings[5]  +  my_strings[6]  + 
my_strings[7]  +  my_strings[8]; 

plus_plus  =  my_strings[0]  +  my_strings[l]  +  my_strings[2]  +  my_strings[3]  +  my_strings[4]  +  my_strings[5]  +  my_strings[6]  + 
my_strings[7]  +  my_strings[8]  +  my_strings[9]; 

QueryPerformanceCounter(&ending_time); 

elapsed_microseconds.QuadPart  =  ending_time.QuadPart  -  starting_time.QuadPart; 

//this  time  is  in  micro  seconds 

auto  te_plus_plus  =  static_cast<double>((elapsed_microseconds.QuadPart  *  1000000.0)  /  frequency.QuadPart); 


a_file  « te_plus_equal  «  «  te_plus_plus  «  "\r\n"; 


printf("Run:  %d  \t\tte  plus  equal:  %4.2f  \t\tte  plus  plus:  %4.2f\r\n",  i  +  1,  te_plus_equal,  te_plus_plus); 

} 

a_file.close(); 
printff'AII  done!\n"); 

//this  stops  the  program  in  order  to  see  data; 
getchar(); 

return  0; 

} 

The  code  is  very  straightforward.  Sections  need  to  be  commented  out  depending  on  the 
results  that  are  desired.  The  built-in,  high-resolution  counters  are  used  in  order  to  measure  how  long 
a  snippet  of  code  took.  The  results  are  logged  to  the  output  file  for  later  processing. 

After  running  this  program  for  each  of  the  results  desired,  the  results  are  shown  in  figure  1. 
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Figure  1 

std::string  append  measurements 

Figure  1  clearly  shows  that  the  time  needed  to  append  two  std::strings  using  the  +  operator 
takes  significantly  longer  than  the  +=  operator. 

Let’s  take  a  look  at  look  at  the  compiler  generated  assembly  code  in  order  to  get  a  better  idea 
of  why  the  measured  results  were  received.  For  appending  three  std::strings,  the  assembly  code  is 
as  follows: 


plus_equal  =  my_strings[0]; 

00C2E39A  push  0 

00C2E39C  lea  ecx,  [my_strings] 

00C2E3A2  call  std::vector<std::basic_string<char,  std::char_traits<char>,  std::allocator<char>  >,  std::allocator<std::basic_string<char, 

std::char_traits<char>,  std::allocator<char>  >  >  >::operator[]  (0C21014h) 

00C2E3A7  push  eax 

00C2E3A8  lea  ecx,  [plus_equal] 

00C2E3AE  call  std::basic_string<char,  std::char_traits<char>,  std::allocator<char>  >::operator=  (OC212BCh) 

plus_equal  +=  my_strings[l]; 

00C2E3B3  push  1 
plus_equal  +=  my_strings[l]; 

00C2E3B5  lea  ecx,  [my_strings] 

00C2E3BB  call  std::vector<std::basic_string<char,  std::char_traits<char>,  std::allocator<char>  >,  std::allocator<std::basic_string<char, 

std::char_traits<char>,  std::allocator<char>  >  >  >::operator[]  (0C21014h) 

00C2E3C0  push  eax 

00C2E3C1  lea  ecx,  [plus_equal] 

00C2E3C7  call  std::basic_string<char,  std::char_traits<char>,  std::allocator<char>  >::operator+=  (0C21217h) 

plus_equal  +=  my_strings[2]; 

OOC2E3CC  push  2 
00C2E3CE  lea  ecx,  [my_strings] 

00C2E3D4  call  std::vector<std::basic_string<char,  std::char_traits<char>,  std::allocator<char>  >,  std::allocator<std::basic_string<char, 

std::char_traits<char>,  std::allocator<char>  >  >  >::operator[]  (0C21014h) 

00C2E3D9  push  eax 

00C2E3DA  lea  ecx,  [plus_equal] 

00C2E3E0  call  std::basic_string<char,  std::char_traits<char>,  std::allocator<char>  >::operator+=  (0C21217h) 

18  instructions 
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plus_plus  =  my_strings[0]  +  my_strings[l]  +  my_strings[2]; 

00C2E467  push  2 
00C2E469  lea  ecx,  [my_strings] 

00C2E46F  call  std::vector<std::basic_string<char,  std::char_traits<char>,  std::allocator<char>  >,  std::allocator<std::basic_string<char, 
std::char_traits<char>,  std::allocator<char>  >  >  >::operator[]  (0C21014h) 

00C2E474  push  eax 

00C2E475  push  1 

00C2E477  lea  ecx,  [my_strings] 

00C2E47D  call  std::vector<std::basic_string<char,  std::char_traits<char>,  std::allocator<char>  >,  std::allocator<std::basic_string<char, 

std::char_traits<char>,  std::allocator<char>  >  >  >::operator[]  (0C21014h) 

00C2E4S2  push  eax 

00C2E483  push  0 

00C2E485  lea  ecx,  [my_strings] 

00C2E48B  call  std::vector<std::basic_string<char,  std::char_traits<char>,  std::allocator<char>  >,  std::allocator<std::basic_string<char, 

std::char_traits<char>,  std::allocator<char>  >  >  >::operator[]  (0C21014h) 

00C2E490  push  eax 
00C2E491  lea  eax,  [ebp  -  290h] 

00C2E497  push  eax 

00C2E498  call  std::operator+<char,  std::char_traits<char>,  std::allocator<char>  >  (0C216C7h) 

00C2E49D  add  esp,  OCh 

00C2E4A0  mov  dword  ptr[ebp  -  40Ch],  eax 

00C2E4A6  mov  ecx,  dword  ptr[ebp  -  40Ch] 

00C2E4AC  mov  dword  ptr[ebp  -  410h],  ecx 
00C2E4B2  mov  byte  ptr[ebp  -  4],  OEh 
00C2E4B6  mov  edx,  dword  ptr[ebp  -  410h] 

00C2E4BC  push  edx 

00C2E4BD  lea  eax,  [ebp  -  26Ch] 

00C2E4C3  push  eax 

00C2E4C4  call  std::operator+<char,  std::char_traits<char>,  std::allocator<char>  >  (0C211AEh) 

00C2E4C9  add  esp,  OCh 

00C2E4CC  mov  dword  ptr[ebp  -  414h],  eax 

00C2E4D2  mov  ecx,  dword  ptr[ebp  -  414h] 

00C2E4D8  push  ecx 

00C2E4D9  lea  ecx,  [plus_plus] 

00C2E4DF  call  std::basic_string<char,  std::char_traits<char>,  std::allocator<char>  >::operator=  (0C217A8h) 

00C2E4E4  lea  ecx,  [ebp  -  26Ch] 

00C2E4EA  call  std::basic_string<char,  std::char_traits<char>,  std::allocator<char>  >::~basic_string<char,  std::char_traits<char>, 
std::allocator<char>  >(0C2164Fh) 

00C2E4EF  mov  byte  ptr[ebp  -  4],  ODh 

00C2E4F3  lea  ecx,  [ebp  -  290h] 

00C2E4F9  call  std::basic_string<char,  std::char_traits<char>,  std::allocator<char>  >::~basic_string<char,  std::char_traits<char>, 
std::allocator<char>  >(0C2164Fh) 

36  instructions 

The  +=  append  only  created  18  lines  of  machine  code  versus  the  36  lines  of  machine  code 
generated  by  the  +  operator.  So  just  by  the  number  of  instructions  created,  one  can  see  that  the 
+  operator  will  take  longer.  Looking  deeper  into  the  assembly,  it  can  be  seen  that  the  +  operator  is 
returning  a  new  buffer  for  each  +,  whereas  the  +=  operator  is  doing  an  actual  concatenation. 


CONCLUSIONS 

It’s  very  important  for  a  developer  to  understand  the  complexities  of  writing  code  in  one  way 
versus  another.  This  report  clearly  shows  that  the  more  efficient  way  to  append  std::strings  is  to  use 
the  +=  operator. 
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